// Each entry in this list passes one internal-op name to PER_INTERNAL_OP.
// NOTE(review): PER_INTERNAL_OP is not defined in this list; presumably the
// including file defines it before inclusion (X-macro pattern) -- confirm.
// NOTE(review): entry order may be significant if the macro expands to
// enumerators or table slots -- confirm before reordering or inserting.

// composite_extract_<N>: one entry per index N = 0..3.
// NOTE(review): presumably N selects which element is pulled out of a
// composite value -- confirm against the op implementations.
PER_INTERNAL_OP(composite_extract_0)
PER_INTERNAL_OP(composite_extract_1)
PER_INTERNAL_OP(composite_extract_2)
PER_INTERNAL_OP(composite_extract_3)

// insert_triplet_<T>: one entry per type suffix (f32, f64).
// NOTE(review): presumably the suffix is the floating-point width of the
// inserted value -- confirm against the op implementations.
PER_INTERNAL_OP(insert_triplet_f32)
PER_INTERNAL_OP(insert_triplet_f64)

// linear_thread_idx: listed on its own, with no backend-specific prefix.
// NOTE(review): presumably yields the calling thread's linearized index --
// confirm against the op implementation.
PER_INTERNAL_OP(linear_thread_idx)

// test_* entries plus do_nothing and refresh_counter.
// NOTE(review): judging by the names, these look like hooks for exercising
// runtime facilities (stack, active mask, shuffle, list manager, node
// allocator, argument passing) rather than user-facing ops -- confirm.
PER_INTERNAL_OP(test_stack)
PER_INTERNAL_OP(test_active_mask)
PER_INTERNAL_OP(test_shfl)
PER_INTERNAL_OP(test_list_manager)
PER_INTERNAL_OP(test_node_allocator)
PER_INTERNAL_OP(test_node_allocator_gc_cpu)
PER_INTERNAL_OP(do_nothing)
PER_INTERNAL_OP(refresh_counter)
PER_INTERNAL_OP(test_internal_func_args)

// Vulkan
// Entries grouped under the Vulkan backend.
// NOTE(review): the camelCase names resemble GLSL/SPIR-V built-ins (e.g. the
// GL_KHR_shader_subgroup functions); presumably each op maps to the built-in
// of the same name -- confirm against the code generator.

// Workgroup-level barrier entries.
PER_INTERNAL_OP(workgroupBarrier)
PER_INTERNAL_OP(workgroupMemoryBarrier)
// Invocation / thread index entries.
PER_INTERNAL_OP(localInvocationId)
PER_INTERNAL_OP(vkGlobalThreadIdx)
// Subgroup barrier entries.
PER_INTERNAL_OP(subgroupBarrier)
PER_INTERNAL_OP(subgroupMemoryBarrier)
// Subgroup election, broadcast and query entries.
PER_INTERNAL_OP(subgroupElect)
PER_INTERNAL_OP(subgroupBroadcast)
PER_INTERNAL_OP(subgroupSize)
PER_INTERNAL_OP(subgroupInvocationId)
// subgroup<Op> entries for Op in {Add, Mul, Min, Max, And, Or, Xor}.
// NOTE(review): presumably subgroup-wide reductions -- confirm.
PER_INTERNAL_OP(subgroupAdd)
PER_INTERNAL_OP(subgroupMul)
PER_INTERNAL_OP(subgroupMin)
PER_INTERNAL_OP(subgroupMax)
PER_INTERNAL_OP(subgroupAnd)
PER_INTERNAL_OP(subgroupOr)
PER_INTERNAL_OP(subgroupXor)
// subgroupInclusive<Op> entries for the same seven Op names as above.
// NOTE(review): presumably inclusive scans; no subgroupExclusive<Op> entries
// are listed here -- confirm whether that is intentional.
PER_INTERNAL_OP(subgroupInclusiveAdd)
PER_INTERNAL_OP(subgroupInclusiveMul)
PER_INTERNAL_OP(subgroupInclusiveMin)
PER_INTERNAL_OP(subgroupInclusiveMax)
PER_INTERNAL_OP(subgroupInclusiveAnd)
PER_INTERNAL_OP(subgroupInclusiveOr)
PER_INTERNAL_OP(subgroupInclusiveXor)

// CUDA
// Entries grouped under the CUDA backend.
// NOTE(review): the cuda_*_sync names resemble the CUDA warp intrinsics
// (__all_sync, __ballot_sync, __shfl_sync, __match_any_sync, ...); presumably
// each op wraps the intrinsic of the same name -- confirm against the runtime.

// Barrier / fence entries.
PER_INTERNAL_OP(block_barrier)
PER_INTERNAL_OP(grid_memfence)
// Vote-style entries (i32 only).
PER_INTERNAL_OP(cuda_all_sync_i32)
PER_INTERNAL_OP(cuda_any_sync_i32)
PER_INTERNAL_OP(cuda_uni_sync_i32)
PER_INTERNAL_OP(cuda_ballot_i32)
// Shuffle entries: plain, up and down each have _i32 and _f32 entries.
PER_INTERNAL_OP(cuda_shfl_sync_i32)
PER_INTERNAL_OP(cuda_shfl_sync_f32)
PER_INTERNAL_OP(cuda_shfl_up_sync_i32)
PER_INTERNAL_OP(cuda_shfl_up_sync_f32)
PER_INTERNAL_OP(cuda_shfl_down_sync_i32)
PER_INTERNAL_OP(cuda_shfl_down_sync_f32)
// NOTE(review): the xor shuffle has only an _i32 entry, unlike the other
// shuffle variants above -- confirm whether an _f32 entry is intentionally
// absent.
PER_INTERNAL_OP(cuda_shfl_xor_sync_i32)
// Match entries (i32 only).
PER_INTERNAL_OP(cuda_match_any_sync_i32)
PER_INTERNAL_OP(cuda_match_all_sync_i32)
// Active-mask query and warp-level barrier entries.
PER_INTERNAL_OP(cuda_active_mask)
PER_INTERNAL_OP(warp_barrier)
